{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import warnings\n",
    "warnings.filterwarnings(\"ignore\")\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn\n",
    "import pyecharts\n",
    "from collections import Counter"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>jobId</th>\n",
       "      <th>updateTime</th>\n",
       "      <th>willNature</th>\n",
       "      <th>positionName</th>\n",
       "      <th>minimumWage</th>\n",
       "      <th>maximumWage</th>\n",
       "      <th>exp</th>\n",
       "      <th>educationalRequirements</th>\n",
       "      <th>count</th>\n",
       "      <th>enterpriseId</th>\n",
       "      <th>jobRequiredments</th>\n",
       "      <th>welfare</th>\n",
       "      <th>workplace</th>\n",
       "      <th>deadline</th>\n",
       "      <th>function</th>\n",
       "      <th>enterpriseName</th>\n",
       "      <th>keywordList</th>\n",
       "      <th>skillsList</th>\n",
       "      <th>resumeCount</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1631112859985510400</td>\n",
       "      <td>2023-03-02 10:03</td>\n",
       "      <td>全职</td>\n",
       "      <td>会计实习生</td>\n",
       "      <td>3500.0</td>\n",
       "      <td>7000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>大专</td>\n",
       "      <td>2</td>\n",
       "      <td>1507192012301008896</td>\n",
       "      <td>1. 深入了解区域项目，搭建项目概算模板； \\n\\n2. 负责中小项目的项目概算工作； \\n...</td>\n",
       "      <td>餐饮补贴|专业培训|弹性工作</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2024-01-01 00:00</td>\n",
       "      <td>财务实习生</td>\n",
       "      <td>深圳市海柔创新科技有限公司</td>\n",
       "      <td>互联网| 人工智能</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1631112859897430016</td>\n",
       "      <td>2023-03-02 10:03</td>\n",
       "      <td>全职</td>\n",
       "      <td>技术服务工程师</td>\n",
       "      <td>5000.0</td>\n",
       "      <td>10000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>大专</td>\n",
       "      <td>5</td>\n",
       "      <td>1507192012301008896</td>\n",
       "      <td>工作职责\\n\\n1、负责客户项目交付后的运维工作，协助售后服务工程师支持客户现场业务操作，现...</td>\n",
       "      <td>餐饮补贴|专业培训|弹性工作</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-12-31 00:00</td>\n",
       "      <td>技术支持工程师</td>\n",
       "      <td>深圳市海柔创新科技有限公司</td>\n",
       "      <td>互联网| 人工智能</td>\n",
       "      <td>NaN</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1629824814967554048</td>\n",
       "      <td>2023-02-26 20:44</td>\n",
       "      <td>全职</td>\n",
       "      <td>大数据分析师（BI）</td>\n",
       "      <td>4500.0</td>\n",
       "      <td>7000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>1</td>\n",
       "      <td>1629824703571034112</td>\n",
       "      <td>岗位要求：\\n(1) 大学本科及以上学历，计算机、数学相关专业；\\n(2) 熟悉SQL、SA...</td>\n",
       "      <td>餐饮补贴|专业培训|弹性工作</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2023-12-31 00:00</td>\n",
       "      <td>大数据分析师</td>\n",
       "      <td>广州太普软件科技有限公司</td>\n",
       "      <td>互联网| 软件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1613439889204969472</td>\n",
       "      <td>2023-01-12 15:37</td>\n",
       "      <td>实习</td>\n",
       "      <td>自然语言处理工程师</td>\n",
       "      <td>2000.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1613428212640120832</td>\n",
       "      <td>【岗位职责】\\n1.根据业务需求，负责自然语言处理方向的算法研究、产品开发和性能提升。 \\n...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2029-01-01 00:00</td>\n",
       "      <td>其他</td>\n",
       "      <td>广州奇之信息技术有限公司</td>\n",
       "      <td>自然语言</td>\n",
       "      <td>算法研究| 深度学习</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1613439536044572672</td>\n",
       "      <td>2023-01-12 15:35</td>\n",
       "      <td>实习</td>\n",
       "      <td>爬虫工程师</td>\n",
       "      <td>2000.0</td>\n",
       "      <td>4000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1613428212640120832</td>\n",
       "      <td>【岗位要求】\\n1.精通python编程语言\\n2.熟练掌握常用的爬虫框架，如scrapy、...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2029-01-01 00:00</td>\n",
       "      <td>其他</td>\n",
       "      <td>广州奇之信息技术有限公司</td>\n",
       "      <td>Python| 爬虫框架</td>\n",
       "      <td>Python| 爬虫框架| 数据采集</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1563</th>\n",
       "      <td>1462710211658776576</td>\n",
       "      <td>2021-12-08 11:16</td>\n",
       "      <td>全职</td>\n",
       "      <td>体验顾问</td>\n",
       "      <td>7000.0</td>\n",
       "      <td>12000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>50</td>\n",
       "      <td>1462687986234818560</td>\n",
       "      <td>岗位职责：\\n1、大专/本科及以上学历； \\n2、优秀的客户服务意识，热爱消费电子行业 ； ...</td>\n",
       "      <td>五险一金|出国机会|绩效奖金|免费班车|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2021-12-08 11:15</td>\n",
       "      <td>其他</td>\n",
       "      <td>华为慧通商务有限公司</td>\n",
       "      <td>客户服务| 消费电子| 零售服务| 华为产品</td>\n",
       "      <td>产品运营| 项目管理| 数据通信</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1564</th>\n",
       "      <td>1462698431867912192</td>\n",
       "      <td>2021-12-08 11:15</td>\n",
       "      <td>全职</td>\n",
       "      <td>Python爬虫工程师</td>\n",
       "      <td>8000.0</td>\n",
       "      <td>10000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1462687572705804288</td>\n",
       "      <td>岗位职责：\\n1.1年以上爬虫经验；全日制大专及以上学历； \\n2. 熟练掌握python开...</td>\n",
       "      <td>五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2021-12-08 11:14</td>\n",
       "      <td>算法工程师</td>\n",
       "      <td>深圳达普信科技有限公司</td>\n",
       "      <td>Python开发| css| SQL</td>\n",
       "      <td>数据探索| 数据查询| 数据建模| 数据计算| 数据预处理</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1565</th>\n",
       "      <td>1461590578927108096</td>\n",
       "      <td>2021-12-08 11:14</td>\n",
       "      <td>全职</td>\n",
       "      <td>数据分析</td>\n",
       "      <td>6000.0</td>\n",
       "      <td>10000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1461581470710759424</td>\n",
       "      <td>岗位职责：\\n1、根据指定业务场景进行数据分析，撰写分析报告。 \\n2、基于历史数据与实操经...</td>\n",
       "      <td>五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2021-12-08 11:13</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>上海众言网络科技有限公司</td>\n",
       "      <td>数据分析| 大数据分析| 人工智能| SPSS| 数学建模</td>\n",
       "      <td>数据探索| 数据通信| 数据分析| 数据查询| 数据建模</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1566</th>\n",
       "      <td>1461591923750993920</td>\n",
       "      <td>2021-12-08 11:14</td>\n",
       "      <td>全职</td>\n",
       "      <td>数据分析工程师</td>\n",
       "      <td>7000.0</td>\n",
       "      <td>10000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1461581470710759424</td>\n",
       "      <td>岗位职责：\\n1、根据论文、文献标准化各类教学模型的输入输出，产出数学模型分析模板原型，形成...</td>\n",
       "      <td>五险一金|免费班车|员工旅游|交通补贴|餐饮补贴|通讯补贴|专业培训|定期体检|弹性工作|股...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2021-12-08 11:13</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>上海众言网络科技有限公司</td>\n",
       "      <td>数据分析| 大数据分析| 人工智能| 产品发布| 产品设计</td>\n",
       "      <td>数据探索| 数据采集| 数据查询| 数据分析| 数据计算</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1567</th>\n",
       "      <td>1461593160642854912</td>\n",
       "      <td>2021-12-08 11:13</td>\n",
       "      <td>全职</td>\n",
       "      <td>大数据开发工程师</td>\n",
       "      <td>7000.0</td>\n",
       "      <td>12000.0</td>\n",
       "      <td>0</td>\n",
       "      <td>本科</td>\n",
       "      <td>0</td>\n",
       "      <td>1461581151616499712</td>\n",
       "      <td>岗位职责：\\n1.本科及以上学历，计算机类相关专业，有相关程序开发经验； \\n2、熟悉一门高...</td>\n",
       "      <td>五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2021-12-08 11:12</td>\n",
       "      <td>算法工程师</td>\n",
       "      <td>深圳市明源云客电子商务有限公司</td>\n",
       "      <td>数据分析| 数据开发| Scala| Python</td>\n",
       "      <td>数据探索| 数据查询| 数据建模| 数据计算| 数据预处理</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1568 rows × 19 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    jobId        updateTime willNature positionName  \\\n",
       "0     1631112859985510400  2023-03-02 10:03         全职        会计实习生   \n",
       "1     1631112859897430016  2023-03-02 10:03         全职      技术服务工程师   \n",
       "2     1629824814967554048  2023-02-26 20:44         全职   大数据分析师（BI）   \n",
       "3     1613439889204969472  2023-01-12 15:37         实习    自然语言处理工程师   \n",
       "4     1613439536044572672  2023-01-12 15:35         实习        爬虫工程师   \n",
       "...                   ...               ...        ...          ...   \n",
       "1563  1462710211658776576  2021-12-08 11:16         全职         体验顾问   \n",
       "1564  1462698431867912192  2021-12-08 11:15         全职  Python爬虫工程师   \n",
       "1565  1461590578927108096  2021-12-08 11:14         全职         数据分析   \n",
       "1566  1461591923750993920  2021-12-08 11:14         全职      数据分析工程师   \n",
       "1567  1461593160642854912  2021-12-08 11:13         全职     大数据开发工程师   \n",
       "\n",
       "      minimumWage  maximumWage  exp educationalRequirements  count  \\\n",
       "0          3500.0       7000.0    0                      大专      2   \n",
       "1          5000.0      10000.0    0                      大专      5   \n",
       "2          4500.0       7000.0    0                      本科      1   \n",
       "3          2000.0       4000.0    0                      本科      0   \n",
       "4          2000.0       4000.0    0                      本科      0   \n",
       "...           ...          ...  ...                     ...    ...   \n",
       "1563       7000.0      12000.0    0                      本科     50   \n",
       "1564       8000.0      10000.0    0                      本科      0   \n",
       "1565       6000.0      10000.0    0                      本科      0   \n",
       "1566       7000.0      10000.0    0                      本科      0   \n",
       "1567       7000.0      12000.0    0                      本科      0   \n",
       "\n",
       "             enterpriseId                                   jobRequiredments  \\\n",
       "0     1507192012301008896  1. 深入了解区域项目，搭建项目概算模板； \\n\\n2. 负责中小项目的项目概算工作； \\n...   \n",
       "1     1507192012301008896  工作职责\\n\\n1、负责客户项目交付后的运维工作，协助售后服务工程师支持客户现场业务操作，现...   \n",
       "2     1629824703571034112  岗位要求：\\n(1) 大学本科及以上学历，计算机、数学相关专业；\\n(2) 熟悉SQL、SA...   \n",
       "3     1613428212640120832  【岗位职责】\\n1.根据业务需求，负责自然语言处理方向的算法研究、产品开发和性能提升。 \\n...   \n",
       "4     1613428212640120832  【岗位要求】\\n1.精通python编程语言\\n2.熟练掌握常用的爬虫框架，如scrapy、...   \n",
       "...                   ...                                                ...   \n",
       "1563  1462687986234818560  岗位职责：\\n1、大专/本科及以上学历； \\n2、优秀的客户服务意识，热爱消费电子行业 ； ...   \n",
       "1564  1462687572705804288  岗位职责：\\n1.1年以上爬虫经验；全日制大专及以上学历； \\n2. 熟练掌握python开...   \n",
       "1565  1461581470710759424  岗位职责：\\n1、根据指定业务场景进行数据分析，撰写分析报告。 \\n2、基于历史数据与实操经...   \n",
       "1566  1461581470710759424  岗位职责：\\n1、根据论文、文献标准化各类教学模型的输入输出，产出数学模型分析模板原型，形成...   \n",
       "1567  1461581151616499712  岗位职责：\\n1.本科及以上学历，计算机类相关专业，有相关程序开发经验； \\n2、熟悉一门高...   \n",
       "\n",
       "                                                welfare workplace  \\\n",
       "0                                        餐饮补贴|专业培训|弹性工作       NaN   \n",
       "1                                        餐饮补贴|专业培训|弹性工作       NaN   \n",
       "2                                        餐饮补贴|专业培训|弹性工作       NaN   \n",
       "3                                                   NaN       NaN   \n",
       "4                                                   NaN       NaN   \n",
       "...                                                 ...       ...   \n",
       "1563  五险一金|出国机会|绩效奖金|免费班车|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...       NaN   \n",
       "1564  五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...       NaN   \n",
       "1565  五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...       NaN   \n",
       "1566  五险一金|免费班车|员工旅游|交通补贴|餐饮补贴|通讯补贴|专业培训|定期体检|弹性工作|股...       NaN   \n",
       "1567  五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹...       NaN   \n",
       "\n",
       "              deadline function   enterpriseName  \\\n",
       "0     2024-01-01 00:00    财务实习生    深圳市海柔创新科技有限公司   \n",
       "1     2023-12-31 00:00  技术支持工程师    深圳市海柔创新科技有限公司   \n",
       "2     2023-12-31 00:00   大数据分析师     广州太普软件科技有限公司   \n",
       "3     2029-01-01 00:00       其他     广州奇之信息技术有限公司   \n",
       "4     2029-01-01 00:00       其他     广州奇之信息技术有限公司   \n",
       "...                ...      ...              ...   \n",
       "1563  2021-12-08 11:15       其他       华为慧通商务有限公司   \n",
       "1564  2021-12-08 11:14    算法工程师      深圳达普信科技有限公司   \n",
       "1565  2021-12-08 11:13    数据分析师     上海众言网络科技有限公司   \n",
       "1566  2021-12-08 11:13    数据分析师     上海众言网络科技有限公司   \n",
       "1567  2021-12-08 11:12    算法工程师  深圳市明源云客电子商务有限公司   \n",
       "\n",
       "                        keywordList                     skillsList  \\\n",
       "0                         互联网| 人工智能                            NaN   \n",
       "1                         互联网| 人工智能                            NaN   \n",
       "2                           互联网| 软件                            NaN   \n",
       "3                              自然语言                     算法研究| 深度学习   \n",
       "4                      Python| 爬虫框架             Python| 爬虫框架| 数据采集   \n",
       "...                             ...                            ...   \n",
       "1563         客户服务| 消费电子| 零售服务| 华为产品               产品运营| 项目管理| 数据通信   \n",
       "1564             Python开发| css| SQL  数据探索| 数据查询| 数据建模| 数据计算| 数据预处理   \n",
       "1565  数据分析| 大数据分析| 人工智能| SPSS| 数学建模   数据探索| 数据通信| 数据分析| 数据查询| 数据建模   \n",
       "1566  数据分析| 大数据分析| 人工智能| 产品发布| 产品设计   数据探索| 数据采集| 数据查询| 数据分析| 数据计算   \n",
       "1567      数据分析| 数据开发| Scala| Python  数据探索| 数据查询| 数据建模| 数据计算| 数据预处理   \n",
       "\n",
       "      resumeCount  \n",
       "0               2  \n",
       "1               4  \n",
       "2               4  \n",
       "3               4  \n",
       "4               1  \n",
       "...           ...  \n",
       "1563            0  \n",
       "1564            0  \n",
       "1565            1  \n",
       "1566            0  \n",
       "1567            3  \n",
       "\n",
       "[1568 rows x 19 columns]"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "Job = pd.read_csv(\"../Data/ProcessData/Job.csv\")\n",
    "JobDetail = pd.read_csv(\"../Data/ProcessData/JobDetail.csv\")\n",
    "data = Job.merge(JobDetail)\n",
    "data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['餐饮补贴|专业培训|弹性工作', '餐饮补贴|专业培训|弹性工作', '餐饮补贴|专业培训|弹性工作', ...,\n",
       "       '五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹性工作|通讯补贴|定期体检|专业培训',\n",
       "       '五险一金|免费班车|员工旅游|交通补贴|餐饮补贴|通讯补贴|专业培训|定期体检|弹性工作|股票期权|年终奖金|绩效奖金|出国机会',\n",
       "       '五险一金|出国机会|免费班车|绩效奖金|员工旅游|年终奖金|交通补贴|股票期权|餐饮补贴|弹性工作|通讯补贴|定期体检|专业培训'],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "SalaryTreatment = data[['maximumWage','minimumWage','welfare']]\n",
    "SalaryTreatment['welfare'].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [],
   "source": [
    "welfareCount = Counter([word for line in [i.split(\"|\") for i in SalaryTreatment['welfare'] if isinstance(i,str)] for word in line])\n",
    "welfareCount = list(welfareCount.items())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>resumeId</th>\n",
       "      <th>username</th>\n",
       "      <th>gender</th>\n",
       "      <th>jobStatus</th>\n",
       "      <th>exp</th>\n",
       "      <th>expectPosition</th>\n",
       "      <th>willSalaryStart</th>\n",
       "      <th>willSalaryEnd</th>\n",
       "      <th>updateTime</th>\n",
       "      <th>province</th>\n",
       "      <th>...</th>\n",
       "      <th>学校1</th>\n",
       "      <th>专业1</th>\n",
       "      <th>学位1</th>\n",
       "      <th>起始时间1</th>\n",
       "      <th>毕业时间1</th>\n",
       "      <th>学校2</th>\n",
       "      <th>专业2</th>\n",
       "      <th>学位2</th>\n",
       "      <th>起始时间2</th>\n",
       "      <th>毕业时间2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1635610357617786880</td>\n",
       "      <td>欧先生</td>\n",
       "      <td>男</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师|算法工程师</td>\n",
       "      <td>3000</td>\n",
       "      <td>4000</td>\n",
       "      <td>2023-03-14</td>\n",
       "      <td>广东省</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1634019092572798976</td>\n",
       "      <td>赖女士</td>\n",
       "      <td>女</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>4000</td>\n",
       "      <td>5000</td>\n",
       "      <td>2023-03-10</td>\n",
       "      <td>江苏省</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1630818546172952576</td>\n",
       "      <td>陈先生</td>\n",
       "      <td>男</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师|算法工程师</td>\n",
       "      <td>6000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2023-03-01</td>\n",
       "      <td>广东省</td>\n",
       "      <td>...</td>\n",
       "      <td>韩山师范学院</td>\n",
       "      <td>统计学</td>\n",
       "      <td>本科</td>\n",
       "      <td>2019-09-15</td>\n",
       "      <td>2023-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1630884821167374336</td>\n",
       "      <td>李女士</td>\n",
       "      <td>女</td>\n",
       "      <td>无明确就业状态</td>\n",
       "      <td>1</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>5000</td>\n",
       "      <td>8000</td>\n",
       "      <td>2023-03-01</td>\n",
       "      <td>广东省</td>\n",
       "      <td>...</td>\n",
       "      <td>韶关学院</td>\n",
       "      <td>应用统计学</td>\n",
       "      <td>本科</td>\n",
       "      <td>2019-03-09</td>\n",
       "      <td>2023-03-06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1582598236647063552</td>\n",
       "      <td>黄先生</td>\n",
       "      <td>男</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>1</td>\n",
       "      <td>数据分析师|数据挖掘工程师|机器学习工程师</td>\n",
       "      <td>8000</td>\n",
       "      <td>12000</td>\n",
       "      <td>2022-10-19</td>\n",
       "      <td>广东省</td>\n",
       "      <td>...</td>\n",
       "      <td>韩山师范学院</td>\n",
       "      <td>统计学</td>\n",
       "      <td>本科</td>\n",
       "      <td>2019-09-15</td>\n",
       "      <td>2023-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16136</th>\n",
       "      <td>7539911453372509716</td>\n",
       "      <td>陈先生</td>\n",
       "      <td>男</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师</td>\n",
       "      <td>4000</td>\n",
       "      <td>6000</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16137</th>\n",
       "      <td>7539911474847346196</td>\n",
       "      <td>易女士</td>\n",
       "      <td>女</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师</td>\n",
       "      <td>4000</td>\n",
       "      <td>6000</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16138</th>\n",
       "      <td>7539911492027215380</td>\n",
       "      <td>李女士</td>\n",
       "      <td>女</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师</td>\n",
       "      <td>4000</td>\n",
       "      <td>6000</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16139</th>\n",
       "      <td>7539911483437280788</td>\n",
       "      <td>林女士</td>\n",
       "      <td>女</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师</td>\n",
       "      <td>4000</td>\n",
       "      <td>6000</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16140</th>\n",
       "      <td>7539911500617149972</td>\n",
       "      <td>范先生</td>\n",
       "      <td>男</td>\n",
       "      <td>毕业找工作</td>\n",
       "      <td>0</td>\n",
       "      <td>数据分析师|数据挖掘工程师</td>\n",
       "      <td>4000</td>\n",
       "      <td>6000</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>16141 rows × 37 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                  resumeId username gender jobStatus  exp  \\\n",
       "0      1635610357617786880      欧先生      男     毕业找工作    0   \n",
       "1      1634019092572798976      赖女士      女     毕业找工作    0   \n",
       "2      1630818546172952576      陈先生      男     毕业找工作    0   \n",
       "3      1630884821167374336      李女士      女   无明确就业状态    1   \n",
       "4      1582598236647063552      黄先生      男     毕业找工作    1   \n",
       "...                    ...      ...    ...       ...  ...   \n",
       "16136  7539911453372509716      陈先生      男     毕业找工作    0   \n",
       "16137  7539911474847346196      易女士      女     毕业找工作    0   \n",
       "16138  7539911492027215380      李女士      女     毕业找工作    0   \n",
       "16139  7539911483437280788      林女士      女     毕业找工作    0   \n",
       "16140  7539911500617149972      范先生      男     毕业找工作    0   \n",
       "\n",
       "              expectPosition  willSalaryStart  willSalaryEnd  updateTime  \\\n",
       "0        数据分析师|数据挖掘工程师|算法工程师             3000           4000  2023-03-14   \n",
       "1                      数据分析师             4000           5000  2023-03-10   \n",
       "2        数据分析师|数据挖掘工程师|算法工程师             6000           8000  2023-03-01   \n",
       "3                      数据分析师             5000           8000  2023-03-01   \n",
       "4      数据分析师|数据挖掘工程师|机器学习工程师             8000          12000  2022-10-19   \n",
       "...                      ...              ...            ...         ...   \n",
       "16136          数据分析师|数据挖掘工程师             4000           6000         NaN   \n",
       "16137          数据分析师|数据挖掘工程师             4000           6000         NaN   \n",
       "16138          数据分析师|数据挖掘工程师             4000           6000         NaN   \n",
       "16139          数据分析师|数据挖掘工程师             4000           6000         NaN   \n",
       "16140          数据分析师|数据挖掘工程师             4000           6000         NaN   \n",
       "\n",
       "      province  ...     学校1    专业1  学位1       起始时间1       毕业时间1  学校2  专业2  \\\n",
       "0          广东省  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "1          江苏省  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "2          广东省  ...  韩山师范学院    统计学   本科  2019-09-15  2023-06-30  NaN  NaN   \n",
       "3          广东省  ...    韶关学院  应用统计学   本科  2019-03-09  2023-03-06  NaN  NaN   \n",
       "4          广东省  ...  韩山师范学院    统计学   本科  2019-09-15  2023-06-15  NaN  NaN   \n",
       "...        ...  ...     ...    ...  ...         ...         ...  ...  ...   \n",
       "16136      NaN  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "16137      NaN  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "16138      NaN  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "16139      NaN  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "16140      NaN  ...     NaN    NaN  NaN         NaN         NaN  NaN  NaN   \n",
       "\n",
       "       学位2 起始时间2 毕业时间2  \n",
       "0      NaN   NaN   NaN  \n",
       "1      NaN   NaN   NaN  \n",
       "2      NaN   NaN   NaN  \n",
       "3      NaN   NaN   NaN  \n",
       "4      NaN   NaN   NaN  \n",
       "...    ...   ...   ...  \n",
       "16136  NaN   NaN   NaN  \n",
       "16137  NaN   NaN   NaN  \n",
       "16138  NaN   NaN   NaN  \n",
       "16139  NaN   NaN   NaN  \n",
       "16140  NaN   NaN   NaN  \n",
       "\n",
       "[16141 rows x 37 columns]"
      ]
     },
     "execution_count": 50,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the two CSV tables and join them. With no `on=` argument pandas joins\n",
    "# on every column name the two frames share; `how=\"inner\"` is the default\n",
    "# and is spelled out here only to make the join type visible.\n",
    "People = pd.read_csv(\"../Data/ProcessData/People.csv\")\n",
    "PeopleDetail = pd.read_csv(\"../Data/ProcessData/PeopleDetail.csv\")\n",
    "data = pd.merge(People, PeopleDetail, how=\"inner\")\n",
    "data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['resumeId', 'username', 'gender', 'jobStatus', 'exp', 'expectPosition',\n",
       "       'willSalaryStart', 'willSalaryEnd', 'updateTime', 'province', 'city',\n",
       "       'region', 'birthday', 'arrivalTime', 'politicalStatus',\n",
       "       'selfEvaluation', 'expectIndustry', 'willNature', 'keywordList',\n",
       "       'projectExperienceList', 'competitionExperienceList',\n",
       "       'trainingExperienceList', 'skillList', 'languageList', 'certList',\n",
       "       'workExperienceList', 'age', '学校1', '专业1', '学位1', '起始时间1', '毕业时间1',\n",
       "       '学校2', '专业2', '学位2', '起始时间2', '毕业时间2'],\n",
       "      dtype='object')"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# List the column labels of the merged `data` frame.\n",
    "data.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>resumeId</th>\n",
       "      <th>birthday</th>\n",
       "      <th>arrivalTime</th>\n",
       "      <th>politicalStatus</th>\n",
       "      <th>selfEvaluation</th>\n",
       "      <th>expectIndustry</th>\n",
       "      <th>willNature</th>\n",
       "      <th>keywordList</th>\n",
       "      <th>projectExperienceList</th>\n",
       "      <th>competitionExperienceList</th>\n",
       "      <th>...</th>\n",
       "      <th>学校1</th>\n",
       "      <th>专业1</th>\n",
       "      <th>学位1</th>\n",
       "      <th>起始时间1</th>\n",
       "      <th>毕业时间1</th>\n",
       "      <th>学校2</th>\n",
       "      <th>专业2</th>\n",
       "      <th>学位2</th>\n",
       "      <th>起始时间2</th>\n",
       "      <th>毕业时间2</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1637801716407730176</td>\n",
       "      <td>2019-03-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>中共预备党员</td>\n",
       "      <td>啥都会</td>\n",
       "      <td>NaN</td>\n",
       "      <td>全职</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1635610357617786880</td>\n",
       "      <td>2002-03-02</td>\n",
       "      <td>时间待议</td>\n",
       "      <td>团员</td>\n",
       "      <td>Python 数据分析</td>\n",
       "      <td>不限</td>\n",
       "      <td>实习</td>\n",
       "      <td>数据分析</td>\n",
       "      <td>NaN</td>\n",
       "      <td>第五届泰迪杯数据分析技能赛:特等奖</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1637791761638227968</td>\n",
       "      <td>2000-02-14</td>\n",
       "      <td>随时到岗</td>\n",
       "      <td>中共党员</td>\n",
       "      <td>啥都会</td>\n",
       "      <td>互联网|电子商务|金融</td>\n",
       "      <td>全职</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1641058737659707392</td>\n",
       "      <td>2002-01-23</td>\n",
       "      <td>1周后到岗</td>\n",
       "      <td>中共党员</td>\n",
       "      <td>爱好</td>\n",
       "      <td>金融|电子商务|媒体</td>\n",
       "      <td>实习</td>\n",
       "      <td>你好| 邯郸</td>\n",
       "      <td>计算机|埃森哲|领导|2023-03-01|2023-03-05|None|None</td>\n",
       "      <td>第六届泰迪杯数据挖掘挑战赛:创新奖</td>\n",
       "      <td>...</td>\n",
       "      <td>北京大学</td>\n",
       "      <td>None</td>\n",
       "      <td>硕士</td>\n",
       "      <td>2021-02-04</td>\n",
       "      <td>2023-07-06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1634019092572798976</td>\n",
       "      <td>2023-02-07</td>\n",
       "      <td>随时到岗</td>\n",
       "      <td>团员</td>\n",
       "      <td>无</td>\n",
       "      <td>互联网</td>\n",
       "      <td>实习</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10864</th>\n",
       "      <td>7539911453372509716</td>\n",
       "      <td>1993-02-09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10865</th>\n",
       "      <td>7539911474847346196</td>\n",
       "      <td>1993-08-22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10866</th>\n",
       "      <td>7539911492027215380</td>\n",
       "      <td>1993-03-04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10867</th>\n",
       "      <td>7539911483437280788</td>\n",
       "      <td>1994-11-24</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10868</th>\n",
       "      <td>7539911500617149972</td>\n",
       "      <td>1995-08-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>10869 rows × 29 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                  resumeId    birthday arrivalTime politicalStatus  \\\n",
       "0      1637801716407730176  2019-03-05         NaN          中共预备党员   \n",
       "1      1635610357617786880  2002-03-02        时间待议              团员   \n",
       "2      1637791761638227968  2000-02-14        随时到岗            中共党员   \n",
       "3      1641058737659707392  2002-01-23       1周后到岗            中共党员   \n",
       "4      1634019092572798976  2023-02-07        随时到岗              团员   \n",
       "...                    ...         ...         ...             ...   \n",
       "10864  7539911453372509716  1993-02-09         NaN             NaN   \n",
       "10865  7539911474847346196  1993-08-22         NaN             NaN   \n",
       "10866  7539911492027215380  1993-03-04         NaN             NaN   \n",
       "10867  7539911483437280788  1994-11-24         NaN             NaN   \n",
       "10868  7539911500617149972  1995-08-08         NaN             NaN   \n",
       "\n",
       "      selfEvaluation expectIndustry willNature keywordList  \\\n",
       "0                啥都会            NaN         全职         NaN   \n",
       "1        Python 数据分析             不限         实习        数据分析   \n",
       "2                啥都会    互联网|电子商务|金融         全职         NaN   \n",
       "3                 爱好     金融|电子商务|媒体         实习      你好| 邯郸   \n",
       "4                  无            互联网         实习         NaN   \n",
       "...              ...            ...        ...         ...   \n",
       "10864            NaN            互联网        NaN         NaN   \n",
       "10865            NaN            互联网        NaN         NaN   \n",
       "10866            NaN            互联网        NaN         NaN   \n",
       "10867            NaN            互联网        NaN         NaN   \n",
       "10868            NaN            互联网        NaN         NaN   \n",
       "\n",
       "                            projectExperienceList competitionExperienceList  \\\n",
       "0                                             NaN                       NaN   \n",
       "1                                             NaN         第五届泰迪杯数据分析技能赛:特等奖   \n",
       "2                                             NaN                       NaN   \n",
       "3      计算机|埃森哲|领导|2023-03-01|2023-03-05|None|None         第六届泰迪杯数据挖掘挑战赛:创新奖   \n",
       "4                                             NaN                       NaN   \n",
       "...                                           ...                       ...   \n",
       "10864                                         NaN                       NaN   \n",
       "10865                                         NaN                       NaN   \n",
       "10866                                         NaN                       NaN   \n",
       "10867                                         NaN                       NaN   \n",
       "10868                                         NaN                       NaN   \n",
       "\n",
       "       ...   学校1   专业1  学位1       起始时间1       毕业时间1  学校2  专业2  学位2 起始时间2 毕业时间2  \n",
       "0      ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "1      ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "2      ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "3      ...  北京大学  None   硕士  2021-02-04  2023-07-06  NaN  NaN  NaN   NaN   NaN  \n",
       "4      ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "...    ...   ...   ...  ...         ...         ...  ...  ...  ...   ...   ...  \n",
       "10864  ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "10865  ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "10866  ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "10867  ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "10868  ...   NaN   NaN  NaN         NaN         NaN  NaN  NaN  NaN   NaN   NaN  \n",
       "\n",
       "[10869 rows x 29 columns]"
      ]
     },
     "execution_count": 53,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the PeopleDetail frame on its own (the table read from PeopleDetail.csv).\n",
    "PeopleDetail"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>enterpriseId</th>\n",
       "      <th>logo</th>\n",
       "      <th>shortName</th>\n",
       "      <th>industry</th>\n",
       "      <th>econKind</th>\n",
       "      <th>registCapi</th>\n",
       "      <th>personScope</th>\n",
       "      <th>email</th>\n",
       "      <th>phone</th>\n",
       "      <th>introduction</th>\n",
       "      <th>recruitJobNum</th>\n",
       "      <th>totalPublicJobNum</th>\n",
       "      <th>provinceCode</th>\n",
       "      <th>cityCode</th>\n",
       "      <th>regionCode</th>\n",
       "      <th>detailedAddress</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1599949909698674688</td>\n",
       "      <td>NaN</td>\n",
       "      <td>极能信息</td>\n",
       "      <td>互联网|大数据</td>\n",
       "      <td>民营公司</td>\n",
       "      <td>100万元以内</td>\n",
       "      <td>少于50人</td>\n",
       "      <td>563398058@qq.com</td>\n",
       "      <td>020-87359876</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>广东省</td>\n",
       "      <td>广州市</td>\n",
       "      <td>黄埔区</td>\n",
       "      <td>广州市黄埔区起云路8号5栋418房</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1604719759373500416</td>\n",
       "      <td>/co91511500MABYFR1W1J/1671432723968/1671432723...</td>\n",
       "      <td>四川中软国际</td>\n",
       "      <td>互联网|软件</td>\n",
       "      <td>上市公司</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>500-1000人</td>\n",
       "      <td>liaohang@chinasofti.com</td>\n",
       "      <td>13123678906</td>\n",
       "      <td>NaN</td>\n",
       "      <td>4</td>\n",
       "      <td>4</td>\n",
       "      <td>四川省</td>\n",
       "      <td>宜宾市</td>\n",
       "      <td>翠屏区</td>\n",
       "      <td>四川省宜宾市临港经济开发区开区白沙湾街道国兴大道沙坪路段9号数据中心801-32号</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1603243973072257024</td>\n",
       "      <td>/co91110105674298552K/1671433239977/1671433239...</td>\n",
       "      <td>悠易互通</td>\n",
       "      <td>互联网|广告</td>\n",
       "      <td>民营公司</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>admin@yoyi.com.cn</td>\n",
       "      <td>13921667896</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>北京市</td>\n",
       "      <td>北京市</td>\n",
       "      <td>NaN</td>\n",
       "      <td>北京市朝阳区光华东里8号院3号楼11层1101内05、06、08、09、10、11、12、1...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1602499923595624448</td>\n",
       "      <td>/co913501006113010212/1670900910550/1670900910...</td>\n",
       "      <td>中电福富</td>\n",
       "      <td>互联网|大数据</td>\n",
       "      <td>民营公司</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>120938463058@qq.com</td>\n",
       "      <td>15915760454</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>福建省</td>\n",
       "      <td>福州市</td>\n",
       "      <td>NaN</td>\n",
       "      <td>福州市鼓楼区软件大道509号</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1507192012301008896</td>\n",
       "      <td>/admin/fd700d14-9b0c-18bc-ae22-3ade75207d54/fd...</td>\n",
       "      <td>海柔创新科技</td>\n",
       "      <td>电子商务|互联网</td>\n",
       "      <td>合资</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>150-500人</td>\n",
       "      <td>hairouchuangxin@tipdm.com</td>\n",
       "      <td>0755-23208112</td>\n",
       "      <td>深圳市海柔创新科技有限公司(HAI ROBOTICS CO., LTD.)，始于2016年深...</td>\n",
       "      <td>3</td>\n",
       "      <td>3</td>\n",
       "      <td>广东省</td>\n",
       "      <td>深圳市</td>\n",
       "      <td>宝安区</td>\n",
       "      <td>西乡街道南昌社区安络科技产业园B栋201、301、401</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>556</th>\n",
       "      <td>1505827247335014400</td>\n",
       "      <td>/佛山市小羽科技有限公司/4154-16478520jpg/16478520.jpg</td>\n",
       "      <td>佛山小羽智能科技</td>\n",
       "      <td>电子商务|互联网</td>\n",
       "      <td>合资</td>\n",
       "      <td>200-500万</td>\n",
       "      <td>50-100人</td>\n",
       "      <td>xiaoyu@tipdm.com</td>\n",
       "      <td>13632902552</td>\n",
       "      <td>佛山市小羽智能科技有限公司成立于2021-01-18，法定代表人为徐化夷，注册资本为444....</td>\n",
       "      <td>5</td>\n",
       "      <td>5</td>\n",
       "      <td>广东省</td>\n",
       "      <td>佛山市</td>\n",
       "      <td>南海区</td>\n",
       "      <td>狮山镇软件园桃园路南海产业智库城一期B座B611室之二(住所申报)</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>557</th>\n",
       "      <td>1491291815121387520</td>\n",
       "      <td>/泰盈科技/10142-logojpg/logo.jpg</td>\n",
       "      <td>泰盈科技</td>\n",
       "      <td>人力资源服务|企业服务</td>\n",
       "      <td>合资</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>150-500人</td>\n",
       "      <td>taiyingkeji@tipdm.com</td>\n",
       "      <td>0757-63509066</td>\n",
       "      <td>广东泰盈科技有限公司成立于2018-09-06，法定代表人为王志利，注册资本为1000万元...</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>广东省</td>\n",
       "      <td>佛山市</td>\n",
       "      <td>南海区</td>\n",
       "      <td>桂城街道融和路25号荣耀国际金融中心4层401-408室(住所申报)</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>558</th>\n",
       "      <td>1476026460258041857</td>\n",
       "      <td>NaN</td>\n",
       "      <td>朗新科技</td>\n",
       "      <td>互联网</td>\n",
       "      <td>合资</td>\n",
       "      <td>NaN</td>\n",
       "      <td>50-100人</td>\n",
       "      <td>ntpt106@tipdm.com</td>\n",
       "      <td>0510-66676999</td>\n",
       "      <td>NaN</td>\n",
       "      <td>2</td>\n",
       "      <td>2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>559</th>\n",
       "      <td>1493063267566878720</td>\n",
       "      <td>/京东信息/43591-164480911png/164480911.png</td>\n",
       "      <td>京东信息</td>\n",
       "      <td>电子商务|互联网</td>\n",
       "      <td>上市公司</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>jingdongxinxi@tipdm.com</td>\n",
       "      <td>0527-87026126</td>\n",
       "      <td>江苏京东信息技术有限公司成立于2009-06-16，法定代表人为曹珂，注册资本为2000万...</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>江苏省</td>\n",
       "      <td>宿迁市</td>\n",
       "      <td>宿豫区</td>\n",
       "      <td>洪泽湖东路与清水江路交叉口</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>560</th>\n",
       "      <td>1518408399195340800</td>\n",
       "      <td>/91310000734084709Q/1650852186157/165085218615...</td>\n",
       "      <td>鼎捷软件</td>\n",
       "      <td>互联网|金融</td>\n",
       "      <td>民营公司</td>\n",
       "      <td>1000万以上</td>\n",
       "      <td>500-1000人</td>\n",
       "      <td>lijund@digiwin.com</td>\n",
       "      <td>021-51791688</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1</td>\n",
       "      <td>1</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>广东省广州市</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>561 rows × 16 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "            enterpriseId                                               logo  \\\n",
       "0    1599949909698674688                                                NaN   \n",
       "1    1604719759373500416  /co91511500MABYFR1W1J/1671432723968/1671432723...   \n",
       "2    1603243973072257024  /co91110105674298552K/1671433239977/1671433239...   \n",
       "3    1602499923595624448  /co913501006113010212/1670900910550/1670900910...   \n",
       "4    1507192012301008896  /admin/fd700d14-9b0c-18bc-ae22-3ade75207d54/fd...   \n",
       "..                   ...                                                ...   \n",
       "556  1505827247335014400         /佛山市小羽科技有限公司/4154-16478520jpg/16478520.jpg   \n",
       "557  1491291815121387520                       /泰盈科技/10142-logojpg/logo.jpg   \n",
       "558  1476026460258041857                                                NaN   \n",
       "559  1493063267566878720             /京东信息/43591-164480911png/164480911.png   \n",
       "560  1518408399195340800  /91310000734084709Q/1650852186157/165085218615...   \n",
       "\n",
       "    shortName     industry econKind registCapi personScope  \\\n",
       "0        极能信息      互联网|大数据     民营公司    100万元以内       少于50人   \n",
       "1      四川中软国际       互联网|软件     上市公司    1000万以上   500-1000人   \n",
       "2        悠易互通       互联网|广告     民营公司    1000万以上    10000人以上   \n",
       "3        中电福富      互联网|大数据     民营公司    1000万以上    10000人以上   \n",
       "4      海柔创新科技     电子商务|互联网       合资    1000万以上    150-500人   \n",
       "..        ...          ...      ...        ...         ...   \n",
       "556  佛山小羽智能科技     电子商务|互联网       合资   200-500万     50-100人   \n",
       "557      泰盈科技  人力资源服务|企业服务       合资    1000万以上    150-500人   \n",
       "558      朗新科技          互联网       合资        NaN     50-100人   \n",
       "559      京东信息     电子商务|互联网     上市公司    1000万以上    10000人以上   \n",
       "560      鼎捷软件       互联网|金融     民营公司    1000万以上   500-1000人   \n",
       "\n",
       "                         email          phone  \\\n",
       "0             563398058@qq.com   020-87359876   \n",
       "1      liaohang@chinasofti.com    13123678906   \n",
       "2            admin@yoyi.com.cn    13921667896   \n",
       "3          120938463058@qq.com    15915760454   \n",
       "4    hairouchuangxin@tipdm.com  0755-23208112   \n",
       "..                         ...            ...   \n",
       "556           xiaoyu@tipdm.com    13632902552   \n",
       "557      taiyingkeji@tipdm.com  0757-63509066   \n",
       "558          ntpt106@tipdm.com  0510-66676999   \n",
       "559    jingdongxinxi@tipdm.com  0527-87026126   \n",
       "560         lijund@digiwin.com   021-51791688   \n",
       "\n",
       "                                          introduction  recruitJobNum  \\\n",
       "0                                                  NaN              1   \n",
       "1                                                  NaN              4   \n",
       "2                                                  NaN              1   \n",
       "3                                                  NaN              1   \n",
       "4    深圳市海柔创新科技有限公司(HAI ROBOTICS CO., LTD.)，始于2016年深...              3   \n",
       "..                                                 ...            ...   \n",
       "556  佛山市小羽智能科技有限公司成立于2021-01-18，法定代表人为徐化夷，注册资本为444....              5   \n",
       "557   广东泰盈科技有限公司成立于2018-09-06，法定代表人为王志利，注册资本为1000万元...              2   \n",
       "558                                                NaN              2   \n",
       "559   江苏京东信息技术有限公司成立于2009-06-16，法定代表人为曹珂，注册资本为2000万...              1   \n",
       "560                                                NaN              1   \n",
       "\n",
       "     totalPublicJobNum provinceCode cityCode regionCode  \\\n",
       "0                    1          广东省      广州市        黄埔区   \n",
       "1                    4          四川省      宜宾市        翠屏区   \n",
       "2                    1          北京市      北京市        NaN   \n",
       "3                    1          福建省      福州市        NaN   \n",
       "4                    3          广东省      深圳市        宝安区   \n",
       "..                 ...          ...      ...        ...   \n",
       "556                  5          广东省      佛山市        南海区   \n",
       "557                  2          广东省      佛山市        南海区   \n",
       "558                  2          NaN      NaN        NaN   \n",
       "559                  1          江苏省      宿迁市        宿豫区   \n",
       "560                  1          NaN      NaN        NaN   \n",
       "\n",
       "                                       detailedAddress  \n",
       "0                                    广州市黄埔区起云路8号5栋418房  \n",
       "1            四川省宜宾市临港经济开发区开区白沙湾街道国兴大道沙坪路段9号数据中心801-32号  \n",
       "2    北京市朝阳区光华东里8号院3号楼11层1101内05、06、08、09、10、11、12、1...  \n",
       "3                                       福州市鼓楼区软件大道509号  \n",
       "4                         西乡街道南昌社区安络科技产业园B栋201、301、401  \n",
       "..                                                 ...  \n",
       "556                  狮山镇软件园桃园路南海产业智库城一期B座B611室之二(住所申报)  \n",
       "557                 桂城街道融和路25号荣耀国际金融中心4层401-408室(住所申报)  \n",
       "558                                                NaN  \n",
       "559                                      洪泽湖东路与清水江路交叉口  \n",
       "560                                             广东省广州市  \n",
       "\n",
       "[561 rows x 16 columns]"
      ]
     },
     "execution_count": 51,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the company table under a descriptive name. Binding it to `_` would\n",
    "# shadow IPython's last-output variable, which IPython then stops updating\n",
    "# for the rest of the kernel session.\n",
    "CompanyDetail = pd.read_csv(\"../Data/ProcessData/CompanyDetail.csv\")\n",
    "CompanyDetail"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.1"
  },
  "orig_nbformat": 4
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
